import pandas as pd

# Merge the per-cluster-count validation CSVs into one shuffled file, and
# write a second file restricted to the ARG / ARG-RAW / similarity columns.

# Collect the frames in a list and concatenate once: DataFrame.append was
# removed in pandas 2.0, and appending inside a loop re-copies the growing
# frame on every iteration.
frames = []
for c in [100, 500, 1000, 2000]:
    df_check = pd.read_csv('../data/human_validation/cluster_validation_{0}.csv'.format(c))
    # Tag every row with the value from the input filename it was read from.
    df_check['cluster'] = c
    frames.append(df_check)

# Same defaults as the old append(): original row labels are kept and
# columns are not sorted.
df = pd.concat(frames)

# Shuffle all rows. No random_state is set, so the order differs per run.
df = df.sample(frac=1)

# Full table, including the 'cluster' tag.
df.to_csv('../data/human_validation/cluster_validation_all.csv', index=False)

# Reduced table with only these three columns, in the same shuffled order
# as the full file (presumably the copy handed to annotators -- confirm).
df[['ARG', 'ARG-RAW', 'similarity']].to_csv('../data/human_validation/cluster_validation_all_send_out.csv', index=False)
